# Launches run_pretrain_megatron_qwen_multi_node.sh (resolved relative to the
# current working directory) with 24 positional arguments.
#
# The argument list is assembled step by step with `set --` so that each group
# of values can carry a comment; the order is exactly what the launched script
# receives as $1..$24.
#
# NOTE(review): the launched script is not visible from this file, so every
# label below is an assumption about what that position means. Confirm each
# one against the script's own argument parsing before relying on it.

# $1-$3: presumably run environment, repo/patch root path, model size.
set -- dsw ../../ 7B

# $4-$5: presumably per-device (micro) batch size and global batch size.
set -- "$@" 8 512

# $6-$7: presumably peak learning rate and minimum learning rate.
set -- "$@" 5e-5 1e-6

# $8-$9: presumably sequence length and padding length.
set -- "$@" 1024 1024

# $10-$11: presumably extra vocabulary size and numeric precision.
set -- "$@" 293 fp16

# $12-$13: presumably tensor- and pipeline-parallel sizes; the "tp2-pp2"
# suffix of the checkpoint path below is consistent with that reading.
set -- "$@" 2 2

# $14-$18: one mode string followed by four boolean feature switches.
# NOTE(review): meaning of each switch is not visible here - verify.
set -- "$@" sel true false false false

# $19: presumably the checkpoint save interval.
set -- "$@" 20000000

# $20: dataset path prefix.
set -- "$@" "/gemini/platform/public/datasets/wudao_test/bin_data/wudao_qwenbpe_content_document"

# $21: path of the checkpoint to start from (assumed - TODO confirm).
set -- "$@" "/gemini/platform/public/llm/huggingface/Qwen/Qwen1.5-7B-Chat-megatron-tp2-pp2"

# $22-$23: presumably total training tokens and warmup tokens.
set -- "$@" 19660395 0

# $24: presumably the base directory for outputs/checkpoints.
set -- "$@" "/gemini/platform/public/users/daoguang/megatron_ckpts/Qwen1.5-7B-megatron-tp2-pp2-24.4.24-debug"

# Kept as the final command so the file's exit status is the launcher's.
bash run_pretrain_megatron_qwen_multi_node.sh "$@"